0 # initial state; NOTE(review): the lines below look like (from_state, to_state, condition, reward) tuples -- confirm against the loader
(0,0,'!r',ConstantRewardFunction(0))  # presumably: remain in state 0 while 'r' does not hold, reward 0 -- TODO confirm
(0,1,'r',ConstantRewardFunction(1))  # presumably: move from state 0 to state 1 when 'r' holds, reward 1 -- TODO confirm
(1,1,'True',ConstantRewardFunction(0))  # presumably: state 1 loops on itself unconditionally, reward 0 -- TODO confirm
